import codecs
from lxml import etree

# Print the text of the first element matched by //p[2] in test.html.
#
# If that element has child nodes, the string-value of each child is printed
# on its own line; otherwise the string-value of the element itself is
# printed.

# Read the document as UTF-8 text. The context manager releases the file
# handle even if reading or decoding raises.
with codecs.open("test.html", "r", "utf-8") as html_file:
    content = html_file.read()

tree = etree.HTML(content)

# The XPath result is a list; only its first entry is used.
matches = tree.xpath('//p[2]')
if not matches:
    # Indexing an empty result would die with a bare IndexError; exit with
    # a readable message (written to stderr, non-zero status) instead.
    raise SystemExit('test.html: no element matches //p[2]')
nodes = matches[0]

# len() of an lxml element is its number of child nodes. The explicit length
# check is kept on purpose: truth-testing an lxml element is deprecated.
if len(nodes) > 0:
    # Only the children are printed here; text that sits directly inside
    # the matched element (outside any child) is not part of this output.
    for child in nodes:
        # Single-argument print(...) behaves the same on Python 2 and 3.
        print(child.xpath('string()'))
else:
    print(nodes.xpath('string()'))

# for i in nodes:
    # print i
	
	
	